% This file was created with JabRef 2.6.
% Encoding: Cp1252

% Proceedings volume of the 3rd workshop on general-purpose GPU computation (2010).
% The author field carries a venue remark rather than a person, so it is wrapped
% in an extra pair of braces: BibTeX then keeps it as one literal name instead of
% splitting it into first/von/last parts (which abbreviating styles would mangle).
% NOTE(review): a "proceedings" entry with this remark moved to a "note" field
% would probably fit better, and the booktitle value should be confirmed.
@INCOLLECTION{WGPGPU,
  author = {{Collocated with ASPLOS '10}},
  title = {3rd Workshop on General-Purpose Computation on Graphic Processing
	Units},
  booktitle = {WINDS},
  publisher = {ACM},
  year = {2010},
  file = {:D\:\\paper\\GPGPU\\GPGPU-Proceedings.pdf:PDF},
  owner = {jouyang},
  timestamp = {2011.09.22}
}

% Conference paper (MICRO-43, 2010) on on-chip networks for manycore accelerators.
% The doi field stores the bare identifier; the resolver form stays in url.
@INPROCEEDINGS{micro43:GPU_NoC,
  author = {Bakhoda, Ali and Kim, John and Aamodt, Tor M.},
  title = {Throughput-Effective On-Chip Networks for Manycore Accelerators},
  booktitle = {Proceedings of the 2010 43rd Annual IEEE/ACM International Symposium
	on Microarchitecture},
  year = {2010},
  series = {MICRO '43},
  pages = {421--432},
  address = {Washington, DC, USA},
  publisher = {IEEE Computer Society},
  acmid = {1934987},
  doi = {10.1109/MICRO.2010.50},
  file = {:D\:\\paper\\GPGPU\\bakhoda.micro43.pdf:PDF},
  isbn = {978-0-7695-4299-7},
  keywords = {NoC, Compute accelerator, GPGPU},
  numpages = {12},
  owner = {jouyang},
  timestamp = {2011.09.01},
  url = {http://dx.doi.org/10.1109/MICRO.2010.50}
}

% Conference paper (ISPASS 2009) analyzing CUDA workloads with a GPU simulator.
% Initials are space-separated so each one survives name abbreviation, acronyms
% in the title are brace-protected against sentence-casing, the page range uses
% an en-dash (--), and month uses the predefined three-letter macro.
@INPROCEEDINGS{ip09:gpgpu-sim,
  author = {Bakhoda, A. and Yuan, G. L. and Fung, W. W. L. and Wong, H. and Aamodt,
	T. M.},
  title = {Analyzing {CUDA} workloads using a detailed {GPU} simulator},
  booktitle = {Performance Analysis of Systems and Software, 2009. ISPASS 2009.
	IEEE International Symposium on},
  year = {2009},
  pages = {163--174},
  month = apr,
  doi = {10.1109/ISPASS.2009.4919648},
  file = {:D\:\\paper\\GPGPU\\2009-ISPASS-GPGPU-sim.pdf:PDF},
  keywords = {CUDA programming;CUDA workload;GPU hardware;GPU simulator;caches;flexible
	programming model;graphic processing unit;high-end graphics card;interconnect
	topology;memory controller;memory request coalescing hardware;microarchitecture
	design;microarchitecture performance simulator;parallel thread execution;parallel
	workload distribution;virtual instruction set;cache storage;computer
	graphic equipment;instruction sets;multi-threading;multiprocessing
	systems;parallel architectures;},
  owner = {jouyang},
  timestamp = {2011.09.22}
}

% Conference paper (IISWC 2010) characterizing the Rodinia benchmark suite.
% All names use the "Last, First" form with space-separated initials, the proper
% noun and acronym in the title are brace-protected, the page range uses an
% en-dash (--), and month uses the predefined three-letter macro.
@INPROCEEDINGS{rodinia,
  author = {Che, Shuai and Sheaffer, J. W. and Boyer, M. and Szafaryn, L. G. and
	Wang, Liang and Skadron, K.},
  title = {A characterization of the {Rodinia} benchmark suite with comparison
	to contemporary {CMP} workloads},
  booktitle = {Workload Characterization (IISWC), 2010 IEEE International Symposium
	on},
  year = {2010},
  pages = {1--11},
  month = dec,
  doi = {10.1109/IISWC.2010.5650274},
  file = {:D\:\\paper\\GPGPU\\rodinia_iiswc10.pdf:PDF},
  keywords = {GPU;NVIDIA GeForce GTX480;Parsec;Rodinia benchmark suite;contemporary
	CMP workloads;graphics processors unit;principal component analysis;space
	coverage;computer graphics;coprocessors;principal component analysis;},
  owner = {jouyang},
  timestamp = {2011.09.23}
}

% Conference paper (2011): Dymaxion, on optimizing memory access patterns
% for heterogeneous systems.
@inproceedings{SC11:Dymaxion,
  title     = {Dymaxion: Optimizing Memory Access Patterns for Heterogeneous Systems},
  author    = {Che, Shuai and Sheaffer, Jeremy W. and Skadron, Kevin},
  booktitle = {Supercomputing '11},
  year      = 2011,
  owner     = {jouyang},
  timestamp = {2011.09.22},
  file      = {:D\:\\paper\\GPGPU\\sc11_dymaxion_dist.pdf:PDF}
}

% Conference paper (HPCA '11) on thread block compaction for SIMT control flow.
% The acronym in the title is brace-protected so sentence-casing styles keep it
% uppercase; author names use the unambiguous "Last, First" form.
@INPROCEEDINGS{HPCA11:thread_block_compaction,
  author = {Fung, Wilson W. L. and Aamodt, Tor M.},
  title = {Thread Block Compaction for Efficient {SIMT} Control Flow},
  booktitle = {HPCA '11},
  year = {2011},
  file = {:D\:\\paper\\GPGPU\\wwlfung.hpca2011.pdf:PDF},
  owner = {jouyang},
  timestamp = {2011.09.22}
}

% Conference paper (SIGGRAPH '08) describing the Larrabee many-core x86 architecture.
% The doi field stores the bare identifier; the resolver form stays in url.
@INPROCEEDINGS{SIGGRAPH08:Larrabee,
  author = {Seiler, Larry and Carmean, Doug and Sprangle, Eric and Forsyth, Tom
	and Abrash, Michael and Dubey, Pradeep and Junkins, Stephen and Lake,
	Adam and Sugerman, Jeremy and Cavin, Robert and Espasa, Roger and
	Grochowski, Ed and Juan, Toni and Hanrahan, Pat},
  title = {Larrabee: a many-core x86 architecture for visual computing},
  booktitle = {ACM SIGGRAPH 2008 papers},
  year = {2008},
  series = {SIGGRAPH '08},
  pages = {18:1--18:15},
  address = {New York, NY, USA},
  publisher = {ACM},
  acmid = {1360617},
  articleno = {18},
  doi = {10.1145/1399504.1360617},
  file = {:D\:\\paper\\GPGPU\\larrabee_manycore.pdf:PDF},
  isbn = {978-1-4503-0112-1},
  keywords = {GPGPU, SIMD, graphics architecture, many-core computing, parallel
	processing, realtime graphics, software rendering, throughput computing,
	visual computing},
  location = {Los Angeles, California},
  numpages = {15},
  owner = {jouyang},
  timestamp = {2011.09.22},
  url = {http://doi.acm.org/10.1145/1399504.1360617}
}

% Conference paper (ISCA '11): Moguls, a model for exploring the memory hierarchy.
% The doi field stores the bare identifier; the resolver form stays in url.
@INPROCEEDINGS{ISCA11:Moguls,
  author = {Sun, Guangyu and Hughes, Christopher J. and Kim, Changkyu and Zhao,
	Jishen and Xu, Cong and Xie, Yuan and Chen, Yen-Kuang},
  title = {Moguls: a model to explore the memory hierarchy for bandwidth improvements},
  booktitle = {Proceedings of the 38th annual international symposium on Computer
	architecture},
  year = {2011},
  series = {ISCA '11},
  pages = {377--388},
  address = {New York, NY, USA},
  publisher = {ACM},
  acmid = {2000109},
  doi = {10.1145/2000064.2000109},
  file = {:D\:\\paper\\GPGPU\\Moguls-Guangyu.pdf:PDF},
  isbn = {978-1-4503-0472-6},
  keywords = {bandwidth, memory hierarchy, memory model, power consumption, throughput
	computing},
  location = {San Jose, California, USA},
  numpages = {12},
  owner = {jouyang},
  timestamp = {2011.09.22},
  url = {http://doi.acm.org/10.1145/2000064.2000109}
}

% Conference paper (PLDI '07) on the EXOCHI heterogeneous multi-core environment.
% The system name in the title is brace-protected: sentence-casing styles keep
% only the first letter of a title capitalized and would otherwise print "Exochi".
% The doi field stores the bare identifier; the resolver form stays in url.
@INPROCEEDINGS{PLDI07:EXOCHI,
  author = {Wang, Perry H. and Collins, Jamison D. and Chinya, Gautham N. and
	Jiang, Hong and Tian, Xinmin and Girkar, Milind and Yang, Nick Y.
	and Lueh, Guei-Yuan and Wang, Hong},
  title = {{EXOCHI}: architecture and programming environment for a heterogeneous
	multi-core multithreaded system},
  booktitle = {Proceedings of the 2007 ACM SIGPLAN conference on Programming language
	design and implementation},
  year = {2007},
  series = {PLDI '07},
  pages = {156--166},
  address = {New York, NY, USA},
  publisher = {ACM},
  acmid = {1250753},
  doi = {10.1145/1250734.1250753},
  file = {:D\:\\paper\\GPGPU\\PLDI07-Intel-EXOCHI_heterogeneous_platform.pdf:PDF},
  isbn = {978-1-59593-633-2},
  keywords = {GPU, heterogeneous multi-cores, openMP},
  location = {San Diego, California, USA},
  numpages = {11},
  owner = {jouyang},
  timestamp = {2011.09.22},
  url = {http://doi.acm.org/10.1145/1250734.1250753}
}

% Master's thesis (University of British Columbia, 2008) on GPU-CPU systems.
% The acronym pair in the title is brace-protected so sentence-casing styles do
% not lowercase it; the author uses the unambiguous "Last, First" form.
@MASTERSTHESIS{UBC:GPU-CPU,
  author = {Wong, Henry Ting-Hei},
  title = {Architectures and Limits of {GPU-CPU} Heterogeneous Systems},
  school = {University of British Columbia},
  year = {2008},
  file = {:D\:\\paper\\GPGPU\\heterogeneous_limits_ubc_2008_fall_wong_henry.pdf:PDF},
  owner = {jouyang},
  timestamp = {2011.09.22}
}

% JabRef metadata blocks. Each one names a field (publisher, author, journal,
% keywords) with an empty value list; presumably these are JabRef's per-field
% content selectors -- confirm against the JabRef documentation before editing.
@comment{jabref-meta: selector_publisher:}

@comment{jabref-meta: selector_author:}

@comment{jabref-meta: selector_journal:}

@comment{jabref-meta: selector_keywords:}

